This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.

Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Ctrl+Shift+Enter.

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Ctrl+Alt+I.

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Ctrl+Shift+K to preview the HTML file).

The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike Knit, Preview does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed.

library(tidyverse)
# install for visualizations 
library(ggplot2)
# install to combine date and time
library(lubridate)

wego <- read_csv("../data/Route 50 Timepoint and Headway Data, 1-1-2023 through 5-12-2025.csv")
wego
# Create new date time column
wego$DATE_TIME <- ymd(wego$DATE) + hms(wego$SCHEDULED_TIME)

# Examine Data
wego


# Filter February TSP values
feb3_10_tsp <- wego |> 
  filter(between(DATE_TIME, 
                 as.Date("2025-02-03 12:00:00"), 
                 as.Date("2025-02-10 12:00:00")))

# Filter Feb-Apr TSP with busses only 2 minutes late or more
feb10_apr28_tsp <- wego |> 
  filter(between(DATE_TIME, 
                 as.Date("2025-02-10 12:00:00"), 
                 as.Date("2025-04-28 12:00:00"))) |> 
  filter(ADHERENCE <= -2)

# Filter May TSP values
may5_12_tsp <- wego |> 
  filter(between(DATE_TIME, 
                 as.Date("2025-05-05 12:00:00"), 
                 as.Date("2025-05-12 12:00:00")))

  

# Add day of week column
wego <- wego |>
  mutate(
    DATE_TIME = as.POSIXct(DATE_TIME),
    DAY_OF_WEEK = wday(DATE_TIME, 
                       label = TRUE, 
                       abbr = FALSE))

wego
NA

# Combine tsp variables into one 
tsp_rows <- bind_rows(
  feb3_10_tsp,
  feb10_apr28_tsp,
  may5_12_tsp
) |> 
  select('ADHERENCE_ID', 'DATE_TIME') |> 
  distinct() |> 
  mutate(tsp = 1)  # Add tsp indicator column for each distinct adherence id

wego <- wego |> 
  left_join(
    tsp_rows,
    by = c('ADHERENCE_ID', 'DATE_TIME')
  ) |> 
  mutate(tsp = coalesce(tsp, 0))

wego |> view()

wego <- wego |>  mutate(
  tsp_indicator = if_else(
    between(DATE_TIME, 
            as.Date("2025-02-03 12:00:00"), 
            as.Date("2025-02-10 12:00:00")) |
    (between(DATE_TIME, 
            as.Date("2025-02-10 12:00:00"), 
            as.Date("2025-04-28 12:00:00")) &
       ADHERENCE <= -2) |
    between(DATE_TIME, 
            as.Date("2025-05-05 12:00:00"), 
            as.Date("2025-05-12 12:00:00")), 1, 0)
    
  )

wego
NA
wego <- wego |> mutate(
  HOUR = hms(SCHEDULED_TIME) |> 
    hour()
  )

wego <- wego |>
  mutate(
    time_of_day = case_when(
      between(HOUR, 4, 5) ~ "early_morning",
      between(HOUR, 6, 8) ~ "morning_peak",
      between(HOUR, 9, 14) ~ "midday",
      between(HOUR, 15, 17) ~ "pm_peak",
      between(HOUR, 18, 20) ~ "evening",
      between(HOUR, 21, 23) ~ "late_night",
      between(HOUR, 0, 3) ~ "late_night",
      .default = "other"
    )
  )

wego
NA

tod_table = table(wego$time_of_day)
pt_tod_table <- prop.table(tod_table)
# tod_data <- as.data.frame(table(wego$time_of_day))
# colnames(tod_data) <- c("time of day", "count")

# tod_data
pt_tod_table

early_morning       evening    late_night        midday  morning_peak         other       pm_peak 
   0.03272224    0.12055936    0.09740419    0.36547452    0.16413139    0.03097748    0.18873082 

# Create the bar plot
# p2 <- ggplot(tod_table, aes(x = "time of day", y = "count", fill = "time_of_day")) +
#   geom_bar(stat = "identity") +
#   labs(y = "Number of late stops", title = "Distribution by Late Bus Stops") +
#   theme_minimal()
# p2
barplot(table(wego$time_of_day), main = "Time of day distribution")#, col = color)


table_tod <- pt_tod_table 
# Create a color vector
color <- rainbow(nrow(table_tod))
# Set the rotation for x-axis labels to 45 degrees
par(las=2)
# Create the vertically stacked bar plot
bp <- barplot(table_tod, main = "Time of day distribution", col = color)
# Add the legend
legend("topright", legend = rownames(table_tod),cex = 0.75, fill = color)

# Add x-axis labels with a 45 degree angle
axis(1, at=bp, labels=colnames(table_tod), las=2, cex.axis=2)
Error in dimnames(x)[[2L]] : subscript out of bounds

late_tod <- table(wego$time_of_day, wego$ADJUSTED_LATE_COUNT)
# Create a color vector
color <- rainbow(nrow(late_tod))
# Set the rotation for x-axis labels to 45 degrees
par(las=2)
# Create the vertically stacked bar plot
bp <- barplot(late_tod, main = "Late bus dist", col = color)
# Add the legend
legend("topright", legend = rownames(late_tod),cex = 0.9, fill = color)
# Add x-axis labels with a 45 degree angle
axis(1, at=bp, labels=colnames(late_tod), las=2, cex.axis=1)

LS0tDQp0aXRsZTogIlIgTm90ZWJvb2siDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQpUaGlzIGlzIGFuIFtSIE1hcmtkb3duXShodHRwOi8vcm1hcmtkb3duLnJzdHVkaW8uY29tKSBOb3RlYm9vay4gV2hlbiB5b3UgZXhlY3V0ZSBjb2RlIHdpdGhpbiB0aGUgbm90ZWJvb2ssIHRoZSByZXN1bHRzIGFwcGVhciBiZW5lYXRoIHRoZSBjb2RlLiANCg0KVHJ5IGV4ZWN1dGluZyB0aGlzIGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqUnVuKiBidXR0b24gd2l0aGluIHRoZSBjaHVuayBvciBieSBwbGFjaW5nIHlvdXIgY3Vyc29yIGluc2lkZSBpdCBhbmQgcHJlc3NpbmcgKkN0cmwrU2hpZnQrRW50ZXIqLiANCg0KYGBge3J9DQoNCg0KDQpgYGANCg0KQWRkIGEgbmV3IGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqSW5zZXJ0IENodW5rKiBidXR0b24gb24gdGhlIHRvb2xiYXIgb3IgYnkgcHJlc3NpbmcgKkN0cmwrQWx0K0kqLg0KDQpXaGVuIHlvdSBzYXZlIHRoZSBub3RlYm9vaywgYW4gSFRNTCBmaWxlIGNvbnRhaW5pbmcgdGhlIGNvZGUgYW5kIG91dHB1dCB3aWxsIGJlIHNhdmVkIGFsb25nc2lkZSBpdCAoY2xpY2sgdGhlICpQcmV2aWV3KiBidXR0b24gb3IgcHJlc3MgKkN0cmwrU2hpZnQrSyogdG8gcHJldmlldyB0aGUgSFRNTCBmaWxlKS4NCg0KVGhlIHByZXZpZXcgc2hvd3MgeW91IGEgcmVuZGVyZWQgSFRNTCBjb3B5IG9mIHRoZSBjb250ZW50cyBvZiB0aGUgZWRpdG9yLiBDb25zZXF1ZW50bHksIHVubGlrZSAqS25pdCosICpQcmV2aWV3KiBkb2VzIG5vdCBydW4gYW55IFIgY29kZSBjaHVua3MuIEluc3RlYWQsIHRoZSBvdXRwdXQgb2YgdGhlIGNodW5rIHdoZW4gaXQgd2FzIGxhc3QgcnVuIGluIHRoZSBlZGl0b3IgaXMgZGlzcGxheWVkLg0KDQpgYGB7cn0NCmxpYnJhcnkodGlkeXZlcnNlKQ0KIyBpbnN0YWxsIGZvciB2aXN1YWxpemF0aW9ucyANCmxpYnJhcnkoZ2dwbG90MikNCiMgaW5zdGFsbCB0byBjb21iaW5lIGRhdGUgYW5kIHRpbWUNCmxpYnJhcnkobHVicmlkYXRlKQ0KDQp3ZWdvIDwtIHJlYWRfY3N2KCIuLi9kYXRhL1JvdXRlIDUwIFRpbWVwb2ludCBhbmQgSGVhZHdheSBEYXRhLCAxLTEtMjAyMyB0aHJvdWdoIDUtMTItMjAyNS5jc3YiKQ0KDQpgYGANCmBgYHtyfQ0Kd2Vnbw0KYGBgDQoNCmBgYHtyfQ0KIyBDcmVhdGUgbmV3IGRhdGUgdGltZSBjb2x1bW4NCndlZ28kREFURV9USU1FIDwtIHltZCh3ZWdvJERBVEUpICsgaG1zKHdlZ28kU0NIRURVTEVEX1RJTUUpDQoNCiMgRXhhbWluZSBEYXRhDQp3ZWdvDQpgYGANCg0KYGBge3J9DQoNCg0KIyBGaWx0ZXIgRmVicnVhcnkgVFNQIHZhbHVlcw0KZmViM18xMF90c3AgPC0gd2VnbyB8PiANCiAgZmlsdGVyKGJldHdlZW4oREFURV9USU1FLCANCiAgICAgICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wMi0wMyAxMjowMDowMCIpLCANCiAgICAgICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wMi0xMCAxMjowMDowMCIpKSkNCg0KIyBGaWx0ZXIgRmViLUFwciBUU1Agd2l0aCBidXNzZXMgb25seSAyIG1pbnV0ZXMgbGF0ZSBvciBtb3JlDQpmZWIxMF9hcHIyOF90c3AgPC0gd2VnbyB8PiANCiAgZmlsdGVyKGJldHdlZW4oREFURV9USU1FLCANCiAgICAgICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wMi0xMCAxMjowMDowMCIpLCANCiAgICAgICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wNC0yOCAxMjowMDowMCIpKSkgfD4gDQogIGZpbHRlcihBREhFUkVOQ0UgPD0gLTIpDQoNCiMgRmlsdGVyIE1heSBUU1AgdmFsdWVzDQptYXk1XzEyX3RzcCA8LSB3ZWdvIHw+IA0KICBmaWx0ZXIoYmV0d2VlbihEQVRFX1RJTUUsIA0KICAgICAgICAgICAgICAgICBhcy5EYXRlKCIyMDI1LTA1LTA1IDEyOjAwOjAwIiksIA0KICAgICAgICAgICAgICAgICBhcy5EYXRlKCIyMDI1LTA1LTEyIDEyOjAwOjAwIikpKQ0KDQogIA0KYGBgDQoNCg0KDQoNCmBgYHtyfQ0KDQojIEFkZCBkYXkgb2Ygd2VlayBjb2x1bW4NCndlZ28gPC0gd2VnbyB8Pg0KICBtdXRhdGUoDQogICAgREFURV9USU1FID0gYXMuUE9TSVhjdChEQVRFX1RJTUUpLA0KICAgIERBWV9PRl9XRUVLID0gd2RheShEQVRFX1RJTUUsIA0KICAgICAgICAgICAgICAgICAgICAgICBsYWJlbCA9IFRSVUUsIA0KICAgICAgICAgICAgICAgICAgICAgICBhYmJyID0gRkFMU0UpKQ0KDQp3ZWdvDQoNCmBgYA0KDQoNCmBgYHtyfQ0KDQojIENvbWJpbmUgdHNwIHZhcmlhYmxlcyBpbnRvIG9uZSANCnRzcF9yb3dzIDwtIGJpbmRfcm93cygNCiAgZmViM18xMF90c3AsDQogIGZlYjEwX2FwcjI4X3RzcCwNCiAgbWF5NV8xMl90c3ANCikgfD4gDQogIHNlbGVjdCgnQURIRVJFTkNFX0lEJywgJ0RBVEVfVElNRScpIHw+IA0KICBkaXN0aW5jdCgpIHw+IA0KICBtdXRhdGUodHNwID0gMSkgICMgQWRkIHRzcCBpbmRpY2F0b3IgY29sdW1uIGZvciBlYWNoIGRpc3RpbmN0IGFkaGVyZW5jZSBpZA0KDQp3ZWdvIDwtIHdlZ28gfD4gDQogIGxlZnRfam9pbigNCiAgICB0c3Bfcm93cywNCiAgICBieSA9IGMoJ0FESEVSRU5DRV9JRCcsICdEQVRFX1RJTUUnKQ0KICApIHw+IA0KICBtdXRhdGUodHNwID0gY29hbGVzY2UodHNwLCAwKSkNCg0KYGBgDQoNCg0KYGBge3J9DQoNCndlZ28gfD4gdmlldygpDQoNCg0KYGBgDQoNCg0KYGBge3J9DQoNCndlZ28gPC0gd2VnbyB8PiAgbXV0YXRlKA0KICB0c3BfaW5kaWNhdG9yID0gaWZfZWxzZSgNCiAgICBiZXR3ZWVuKERBVEVfVElNRSwgDQogICAgICAgICAgICBhcy5EYXRlKCIyMDI1LTAyLTAzIDEyOjAwOjAwIiksIA0KICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wMi0xMCAxMjowMDowMCIpKSB8DQogICAgKGJldHdlZW4oREFURV9USU1FLCANCiAgICAgICAgICAgIGFzLkRhdGUoIjIwMjUtMDItMTAgMTI6MDA6MDAiKSwgDQogICAgICAgICAgICBhcy5EYXRlKCIyMDI1LTA0LTI4IDEyOjAwOjAwIikpICYNCiAgICAgICBBREhFUkVOQ0UgPD0gLTIpIHwNCiAgICBiZXR3ZWVuKERBVEVfVElNRSwgDQogICAgICAgICAgICBhcy5EYXRlKCIyMDI1LTA1LTA1IDEyOjAwOjAwIiksIA0KICAgICAgICAgICAgYXMuRGF0ZSgiMjAyNS0wNS0xMiAxMjowMDowMCIpKSwgMSwgMCkNCiAgICANCiAgKQ0KDQp3ZWdvDQoNCmBgYA0KDQpgYGB7cn0NCndlZ28gPC0gd2VnbyB8PiBtdXRhdGUoDQogIEhPVVIgPSBobXMoU0NIRURVTEVEX1RJTUUpIHw+IA0KICAgIGhvdXIoKQ0KICApDQoNCmBgYA0KDQpgYGB7cn0NCg0Kd2VnbyA8LSB3ZWdvIHw+DQogIG11dGF0ZSgNCiAgICB0aW1lX29mX2RheSA9IGNhc2Vfd2hlbigNCiAgICAgIGJldHdlZW4oSE9VUiwgNCwgNSkgfiAiZWFybHlfbW9ybmluZyIsDQogICAgICBiZXR3ZWVuKEhPVVIsIDYsIDgpIH4gIm1vcm5pbmdfcGVhayIsDQogICAgICBiZXR3ZWVuKEhPVVIsIDksIDE0KSB+ICJtaWRkYXkiLA0KICAgICAgYmV0d2VlbihIT1VSLCAxNSwgMTcpIH4gInBtX3BlYWsiLA0KICAgICAgYmV0d2VlbihIT1VSLCAxOCwgMjApIH4gImV2ZW5pbmciLA0KICAgICAgYmV0d2VlbihIT1VSLCAyMSwgMjMpIH4gImxhdGVfbmlnaHQiLA0KICAgICAgYmV0d2VlbihIT1VSLCAwLCAzKSB+ICJsYXRlX25pZ2h0IiwNCiAgICAgIC5kZWZhdWx0ID0gIm90aGVyIg0KICAgICkNCiAgKQ0KDQp3ZWdvDQoNCmBgYA0KDQpgYGB7cn0NCg0KdG9kX3RhYmxlID0gdGFibGUod2VnbyR0aW1lX29mX2RheSkNCnB0X3RvZF90YWJsZSA8LSBwcm9wLnRhYmxlKHRvZF90YWJsZSkNCiMgdG9kX2RhdGEgPC0gYXMuZGF0YS5mcmFtZSh0YWJsZSh3ZWdvJHRpbWVfb2ZfZGF5KSkNCiMgY29sbmFtZXModG9kX2RhdGEpIDwtIGMoInRpbWUgb2YgZGF5IiwgImNvdW50IikNCg0KIyB0b2RfZGF0YQ0KcHRfdG9kX3RhYmxlDQoNCmBgYA0KDQoNCmBgYHtyfQ0KDQojIENyZWF0ZSB0aGUgYmFyIHBsb3QNCiMgcDIgPC0gZ2dwbG90KHRvZF90YWJsZSwgYWVzKHggPSAidGltZSBvZiBkYXkiLCB5ID0gImNvdW50IiwgZmlsbCA9ICJ0aW1lX29mX2RheSIpKSArDQojICAgZ2VvbV9iYXIoc3RhdCA9ICJpZGVudGl0eSIpICsNCiMgICBsYWJzKHkgPSAiTnVtYmVyIG9mIGxhdGUgc3RvcHMiLCB0aXRsZSA9ICJEaXN0cmlidXRpb24gYnkgTGF0ZSBCdXMgU3RvcHMiKSArDQojICAgdGhlbWVfbWluaW1hbCgpDQojIHAyDQpiYXJwbG90KHRhYmxlKHdlZ28kdGltZV9vZl9kYXkpLCBtYWluID0gIlRpbWUgb2YgZGF5IGRpc3RyaWJ1dGlvbiIpIywgY29sID0gY29sb3IpDQoNCmBgYA0KDQoNCmBgYHtyfQ0KDQp0YWJsZV90b2QgPC0gcHRfdG9kX3RhYmxlIA0KIyBDcmVhdGUgYSBjb2xvciB2ZWN0b3INCmNvbG9yIDwtIHJhaW5ib3cobnJvdyh0YWJsZV90b2QpKQ0KIyBTZXQgdGhlIHJvdGF0aW9uIGZvciB4LWF4aXMgbGFiZWxzIHRvIDQ1IGRlZ3JlZXMNCnBhcihsYXM9MikNCiMgQ3JlYXRlIHRoZSB2ZXJ0aWNhbGx5IHN0YWNrZWQgYmFyIHBsb3QNCmJwIDwtIGJhcnBsb3QodGFibGVfdG9kLCBtYWluID0gIlRpbWUgb2YgZGF5IGRpc3RyaWJ1dGlvbiIsIGNvbCA9IGNvbG9yKQ0KIyBBZGQgdGhlIGxlZ2VuZA0KbGVnZW5kKCJ0b3ByaWdodCIsIGxlZ2VuZCA9IHJvd25hbWVzKHRhYmxlX3RvZCksY2V4ID0gMC43NSwgZmlsbCA9IGNvbG9yKQ0KIyBBZGQgeC1heGlzIGxhYmVscyB3aXRoIGEgNDUgZGVncmVlIGFuZ2xlDQpheGlzKDEsIGF0PWJwLCBsYWJlbHM9Y29sbmFtZXModGFibGVfdG9kKSwgbGFzPTIsIGNleC5heGlzPTIpDQoNCmBgYA0KDQoNCmBgYHtyfQ0KDQpsYXRlX3RvZCA8LSB0YWJsZSh3ZWdvJHRpbWVfb2ZfZGF5LCB3ZWdvJEFESlVTVEVEX0xBVEVfQ09VTlQpDQojIENyZWF0ZSBhIGNvbG9yIHZlY3Rvcg0KY29sb3IgPC0gcmFpbmJvdyhucm93KGxhdGVfdG9kKSkNCiMgU2V0IHRoZSByb3RhdGlvbiBmb3IgeC1heGlzIGxhYmVscyB0byA0NSBkZWdyZWVzDQpwYXIobGFzPTIpDQojIENyZWF0ZSB0aGUgdmVydGljYWxseSBzdGFja2VkIGJhciBwbG90DQpicCA8LSBiYXJwbG90KGxhdGVfdG9kLCBtYWluID0gIkxhdGUgYnVzIGRpc3QiLCBjb2wgPSBjb2xvcikNCiMgQWRkIHRoZSBsZWdlbmQNCmxlZ2VuZCgidG9wcmlnaHQiLCBsZWdlbmQgPSByb3duYW1lcyhsYXRlX3RvZCksY2V4ID0gMC45LCBmaWxsID0gY29sb3IpDQojIEFkZCB4LWF4aXMgbGFiZWxzIHdpdGggYSA0NSBkZWdyZWUgYW5nbGUNCmF4aXMoMSwgYXQ9YnAsIGxhYmVscz1jb2xuYW1lcyhsYXRlX3RvZCksIGxhcz0yLCBjZXguYXhpcz0xKQ0KDQpgYGANCg0KDQpgYGB7cn0NCmBgYA0KDQoNCmBgYHtyfQ0KYGBgDQoNCg0KDQoNCg0KDQoNCg==